# This file is generated by battle_generator.py

# Base eval name. Its `id` matches the versioned key defined directly below,
# and `accuracy` is the only metric listed.
joke-animals-vs-fruits:
  id: joke-animals-vs-fruits.dev.v0
  metrics:
    - accuracy
# Versioned eval definition referenced by the `id` above.
joke-animals-vs-fruits.dev.v0:
  # Presumably a `module.path:ClassName` reference to the eval implementation.
  class: evals.elsuite.modelgraded.classify:ModelBasedClassify
  args:
    # JSONL sample file for this battle.
    # NOTE(review): the base directory this path is resolved against is not
    # visible here; confirm against the loader.
    samples_jsonl: test_multiio/battles/joke_animals_vs_fruits.jsonl
    eval_type: cot_classify
    modelgraded_spec: battle

# Base eval name. Its `id` matches the versioned key defined directly below,
# and `accuracy` is the only metric listed.
rap-people-vs-people:
  id: rap-people-vs-people.dev.v0
  metrics:
    - accuracy
# Versioned eval definition referenced by the `id` above.
rap-people-vs-people.dev.v0:
  # Presumably a `module.path:ClassName` reference to the eval implementation.
  class: evals.elsuite.modelgraded.classify:ModelBasedClassify
  args:
    # JSONL sample file for this battle.
    # NOTE(review): the base directory this path is resolved against is not
    # visible here; confirm against the loader.
    samples_jsonl: test_multiio/battles/rap_people_vs_people.jsonl
    eval_type: cot_classify
    modelgraded_spec: battle

# Base eval name. Its `id` matches the versioned key defined directly below,
# and `accuracy` is the only metric listed.
rap-animals-vs-fruits:
  id: rap-animals-vs-fruits.dev.v0
  metrics:
    - accuracy
# Versioned eval definition referenced by the `id` above.
rap-animals-vs-fruits.dev.v0:
  # Presumably a `module.path:ClassName` reference to the eval implementation.
  class: evals.elsuite.modelgraded.classify:ModelBasedClassify
  args:
    # JSONL sample file for this battle.
    # NOTE(review): the base directory this path is resolved against is not
    # visible here; confirm against the loader.
    samples_jsonl: test_multiio/battles/rap_animals_vs_fruits.jsonl
    eval_type: cot_classify
    modelgraded_spec: battle

# Base eval name. Its `id` matches the versioned key defined directly below,
# and `accuracy` is the only metric listed.
rap-people-vs-fruits:
  id: rap-people-vs-fruits.dev.v0
  metrics:
    - accuracy
# Versioned eval definition referenced by the `id` above.
rap-people-vs-fruits.dev.v0:
  # Presumably a `module.path:ClassName` reference to the eval implementation.
  class: evals.elsuite.modelgraded.classify:ModelBasedClassify
  args:
    # JSONL sample file for this battle.
    # NOTE(review): the base directory this path is resolved against is not
    # visible here; confirm against the loader.
    samples_jsonl: test_multiio/battles/rap_people_vs_fruits.jsonl
    eval_type: cot_classify
    modelgraded_spec: battle